Load all relevant R libraries.
# Load Libraries
library("RPostgres")
library("ggplot2")
library("tidyverse")
library("dbplyr")
library("lubridate")
library("data.table")
library("dtplyr")
library("ggpubr")
library("muStat")
library("mvnormtest")
library("knitr")
library("kableExtra")
# load the PostgreSQL driver
drv <- dbDriver("Postgres")
# create a connection to the postgres database
# set the search path to the mimiciii schema
con <- dbConnect(drv, dbname = "mimic",
host = "localhost", port = 5432,
user = "mousaghannam")
dbSendQuery(con, 'set search_path to mimiciii')
<PqResult>
SQL set search_path to mimiciii
ROWS Fetched: 0 [complete]
Changed: 0
# show a list of tables
dbListTables(con)
Closing open result set, cancelling previous query
[1] "chartevents_8" "admissions" "callout" "caregivers"
[5] "chartevents_1" "chartevents_2" "chartevents_3" "chartevents_4"
[9] "chartevents_5" "chartevents_6" "chartevents_7" "chartevents_9"
[13] "chartevents_10" "chartevents_11" "icustays" "inputevents_cv"
[17] "inputevents_mv" "labevents" "microbiologyevents" "chartevents_12"
[21] "chartevents_13" "chartevents_14" "chartevents" "chartevents_15"
[25] "chartevents_16" "chartevents_17" "cptevents" "datetimeevents"
[29] "diagnoses_icd" "drgcodes" "d_cpt" "d_icd_diagnoses"
[33] "prescriptions" "services" "d_icd_procedures" "d_items"
[37] "d_labitems" "noteevents" "outputevents" "patients"
[41] "procedureevents_mv" "procedures_icd" "transfers"
This is a memory conservative approaching for performing SQL queries on DB. We can pull tables in memory and do certain analyses on them, without actually having to save a given object into the R environment.
#Memory conserative approaching for performing SQL queries on DB
#(Rewrite this function to handle multiple inputs )
tbl_mimic <- function(table) {
table <- as.character(substitute(table))
tbl(con, dbplyr::in_schema("mimiciii", table))
}
This “dictionary” will contain all of the diagnoses events in the database associated with a given hospital admission id (hadm_id), along with a description of the icd9 code.
#Pull dictionary for diagnoses
d_icd_diagnoses <- tbl_mimic(d_icd_diagnoses) %>%
select(icd9_code, short_title)
diagnoses_icd <-tbl_mimic(diagnoses_icd) %>%
select(hadm_id, icd9_code, seq_num)
#ICD-9 Codes + their descriptions
icd9_dict <- diagnoses_icd %>%
inner_join(d_icd_diagnoses, by = "icd9_code")
icd9_dict
Saved all of the lab_ids into R environment with collect(), for filtering in the next step.
We are choosing to include the 1st and 4th row, which are strictly blood lab value draws for potassium.
#Drugs to include for potassium
itemidsK <- lab_idsK$itemid[c(1,4)]
We are now taking the table labevents, which contains all the lab events in the database, and selecting the rows associated with the two blood potassium lab values itemids that we chose above.
labevents <- tbl_mimic(labevents)
labevents %>%
filter(itemid %in% itemidsK) %>%
inner_join(select(tbl_mimic(d_labitems),-loinc_code, -row_id ), by = "itemid") %>%
select(subject_id, hadm_id, itemid, charttime, valuenum, valueuom, label, flag, fluid, category) -> labEventsK
labEventsK %>% count() %>% collect() -> numLabKevents
labEventsK
print(paste(" There are ",pull(numLabKevents[1,1]), " total potassium lab values that were extracted from the labevents table." ))
[1] " There are 1038686 total potassium lab values that were extracted from the labevents table."
The d_items table in mimics contains a dictionary for all of the events associated with both the metaview and careview database. We are only going to focus on the metaview database at this point. We then want to filter this table by the label description for items that are related to potassium.
d_items <- tbl_mimic(d_items) #Pull dictionary for all lab events into memory
d_items %>%
filter(label %ilike% "%potassium%" | label %ilike% "%kcl%") %>%
filter(str_detect(tolower(dbsource), "meta")) %>%
arrange(label) -> k_items_MV
k_items_MV
NA
Although there are events sourced from either metaview or careview, these two hospital databases are actually linked to 3 different tables in the mimics database: inputevents_mv, inputevents_cv or chartevents. Since we are examining only the metavision database, it will only link to inputevents_mv and chartevents. We would like to select for only the events that link to inputevents_mv.
k_items_MV %>%
filter(linksto=="inputevents_mv") %>% collect() -> k_items_MV_IM
k_items_MV_IM
If you look at the above table, the first row has a KCL (Bolus) with unit mL, while the 5th row has Potassium Chloride with units in mEq. According to the mimics iii website:
“Metavision records IO data using two tables: RANGESIGNALS and ORDERENTRY. These tables do not appear in MIMIC-III as they have been merged to form the > INPUTEVENTS_MV table. RANGESIGNALS contains recorded data elements which last for a fixed period of time. Furthermore, the RANGESIGNALS table recorded > information for each component of the drug separately. For example, for a norepinephrine administration there would be two components: a main order > component (norepinephrine) and a solution component (NaCl).” 1
Therefore, we will only be selecting repletions based off of the “main order component”, and ignoring the solution. We will select for the 4th and 5th rows, which correspond to Potassiume Acetate and Potassium Chloride.
k_items_MV_IM %>% slice(-6,-3, -2,-1) -> k_items_MV_IM #ONLY KEEPING THE REPLETIONS, THE ADDITIVE AMOUNTS, NOT THE BOLUS
k_items_MV_IM
k_items_MV_IM %>% pull(itemid) -> k_items_MV_IM_vector
We will now use the filtered ids for the two additive solutions above to pull electrolyte repletions from the inputevents_mv table.
inputevents_mv <- tbl_mimic(inputevents_mv)
inputevents_mv %>%
filter(itemid %in% k_items_MV_IM_vector) %>%
select(subject_id, hadm_id,icustay_id, linkorderid, orderid, itemid, starttime, endtime, amount, amountuom, rate, rateuom, statusdescription, ordercomponenttypedescription) %>%
filter(!statusdescription == "Rewritten") %>%
rename(itemid.repletion = itemid) -> repEventsK
repEventsK
Determine the amount of potassium repletions:
repEventsK %>% count() %>% collect() -> numKRepletions
print(paste(" There are ",pull(numKRepletions[1,1]), " total potassium repletions that were extracted from the inputevents_mv table." ))
[1] " There are 66429 total potassium repletions that were extracted from the inputevents_mv table."
Both the tables containing the lab draws and the repletion events have been extracted. We can now join them to begin analyzing the relationship between them.
In addition to joining the tables, we have renamed the column corresponding to the moment the fluid collection for the lab value was recorded, charttime, as charttime.lab for clarity.
repEventsK %>%
inner_join(labEventsK, by=c("subject_id" = "subject_id", "hadm_id" = "hadm_id")) %>%
distinct() %>%
rename(charttime.lab = charttime) %>%
collect() -> k_lab_repletions_MV_new
k_lab_repletions_MV_new
We want to flag all repletion events that occurred either 24 hours before or 24 hours after a given lab value. We then filter the table, storing all of the repletions occurring BEFORE a given lab value in one table, and all of the ones occurring AFTER a given lab value in another.
#Find the RECENT Repletions
k_lab_repletions_MV_new %>%
mutate(charttime.lab= as_datetime(charttime.lab), endtime=as_datetime(endtime), starttime = as_datetime(starttime)) %>%
mutate(isRecentPre = difftime(starttime, charttime.lab, units = "hours") <= 24 & difftime(starttime, charttime.lab, units = "hours") > 0 ) %>%
mutate(isRecentPost = difftime(endtime, charttime.lab, units = "hours") >= -24 & difftime(endtime, charttime.lab, units = "hours") < 0 ) -> allRepLabEvents
allRepLabEvents %>%
filter(isRecentPre | isRecentPost)
We have a table that contains all of the repletion events that occur either 24 hours prior or after a given lab value. We then group the rows by each subject and hospital id, as well as the time of fluid acquisition for the lab value. Then, we create a column that generates a flag if the lab value that is chosen is the minimum starttime for all the possible starttimes. Because there are multiple lab values, as well as multiple repletion events, for a given hadm_id the table outputted has all the possible permutations. We want to select the most recent repletion AFTER a lab value, so we choose the repletion with the starttime equal to the minimum starttime for a given lab value.
#Potassium lab event PRE-repletions
allRepLabEvents %>%
filter(isRecentPre) %>%
group_by(subject_id, hadm_id,charttime.lab) %>%
mutate(isMostRecentRepletion = starttime == min(starttime)) %>%
filter(isMostRecentRepletion) %>%
ungroup() %>%
group_by(subject_id, hadm_id, starttime) %>%
mutate(isMostRecentLabEvent = charttime.lab == max(charttime.lab)) %>%
filter(isMostRecentLabEvent) %>% distinct() -> pre_k_lab_repletions_MV_new
pre_k_lab_repletions_MV_new
For the post-repletion lab values, we are now doing the same thing, but instead finding the maximum endtime prior to a given lab value, to select the most recent repletion prior to a given lab value.
#Potassium lab event POST-repletions
allRepLabEvents %>%
filter(isRecentPost) %>%
group_by(subject_id, hadm_id,charttime.lab) %>%
mutate(isMostRecentRepletion = endtime == max(endtime)) %>%
filter(isMostRecentRepletion) %>%
ungroup() %>%
group_by(subject_id, hadm_id, endtime) %>%
mutate(isMostRecentLabEvent = charttime.lab == min(charttime.lab)) %>%
filter(isMostRecentLabEvent) %>% distinct() -> post_k_lab_repletions_MV_new
post_k_lab_repletions_MV_new
We then combine all of the values from the “pre-repletion” and “post-repletion” tables, into one table. We create a new column preVsPost to indicate if a given event is either before or after a lab value. Conceivably, the same repletion could correspond to a
#Combine them into one dataset
k_pre_post_repletions_MV_new <- bind_rows(list(pre_repletion = pre_k_lab_repletions_MV_new, post_repletion = post_k_lab_repletions_MV_new), .id = "preVsPost")
k_pre_post_repletions_MV_new %>% distinct()
NA
We will now determine the set of lab values for which there was no immediate repletion afterward.
In this section, we have started by filtering all the repletions prior and after a lab value, just like for the analysis on the repletions. However, this time, if there are multiple lab values that occur before a given repletion (or after), we are taking the ones after the first one.
#Potassium lab event PRE-repletions
allRepLabEvents %>%
filter(isRecentPre) %>%
group_by(subject_id, hadm_id,charttime.lab) %>%
mutate(isMostRecentRepletion = starttime == min(starttime)) %>%
filter(isMostRecentRepletion) %>%
ungroup() %>%
group_by(subject_id, hadm_id, starttime) %>%
mutate(isMostRecentLabEvent = charttime.lab == max(charttime.lab)) %>%
filter(!isMostRecentLabEvent) %>% distinct() -> nonRepletLabsPre
#Potassium lab event POST-repletions
allRepLabEvents %>%
filter(isRecentPost) %>%
group_by(subject_id, hadm_id,charttime.lab) %>%
mutate(isMostRecentRepletion = endtime == max(endtime)) %>%
filter(isMostRecentRepletion) %>%
ungroup() %>%
group_by(subject_id, hadm_id, endtime) %>%
mutate(isMostRecentLabEvent = charttime.lab == min(charttime.lab)) %>%
filter(!isMostRecentLabEvent) %>% distinct() -> nonRepletLabsPost
allNonRepletions <- bind_rows(list(pre_repletion = nonRepletLabsPre, post_repletion = nonRepletLabsPost), .id = "preVsPost")
We now want to exclude all the rows based on certain criteria.
We have a table called hadm_id_table which contains all of the hadm_ids of patients with diagnoses that would confound our results (kidney disease, etc). (WILL ADD HOW I CREATED THIS TABLE LATER).
hadm_id_table
As a result, we could simply do a semi-join to determine how many people in each group were excluded. Note, we are doing the anti-join on the table with the most recent repletion before and after a given lab result, within a 24 hour time range. We are not doing it on the set of ALL possible repletion and or lab result events.
hadm_id_table %>%
semi_join(k_pre_post_repletions_MV_new, by = "hadm_id") %>%
select(hadm_id, .id) %>%
group_by(.id) %>%
summarize(n = n()) %>%
arrange(desc(n)) %>%
kable()
`summarise()` ungrouping output (override with `.groups` argument)
| .id | n |
|---|---|
| renal-codes | 4973 |
| afib-codes | 2954 |
| aki-codes | 2606 |
| chf-codes | 2272 |
| cad-codes | 919 |
| prbc | 457 |
| ckd-codes | 319 |
| esrd-codes | 299 |
| paralyzed-codes | 125 |
| rhabdo-codes | 114 |
| dialysis-codes | 78 |
| parathyroid-codes | 42 |
| sarcoid-codes | 33 |
| pediatrics | 16 |
| burn-codes | 9 |
| nutrit-def | 6 |
k_pre_post_repletions_MV_new %>%
ungroup()%>%
semi_join(hadm_id_table, by = "hadm_id") %>%
select(icustay_id, orderir, .id) %>%
group_by(.id) %>%
summarize(n = n()) %>%
arrange(desc(n)) %>%
kable()
Error: Can't subset columns that don't exist.
x Column `orderir` doesn't exist.
And here is the resultant dataset after actually excluding this time, using an anti-join instead.
postExclusionK_Repleted %>%
mutate(repletionRange = case_when(valuenum < 3.5 & flag == "abnormal" ~ "below normal",
flag != "abnormal" ~ "within range",
valuenum > 4.5 & flag == "abnormal" ~ "above range")) -> postExclusionsK_Repleted
Error in eval(lhs, parent, parent) :
object 'postExclusionK_Repleted' not found
###Another Exclusions
We are going to do analysis here on the dataset containing repletions. We are making this distinction, as later on, we will do analysis on non-repletions.
In this table we are just doing some summary analysis on the dataset.
postExclusionsK_Repleted %>%
group_by( preVsPost) %>%
summarize(n = n(), mean = mean(valuenum, na.rm = TRUE), standard_deviation = sd(valuenum, na.rm = T))
`summarise()` ungrouping output (override with `.groups` argument)
Histogram of Pre and Post Repletions
ggpar(gghistogram(data = postExclusionsK_Repleted, x="valuenum", fill = "preVsPost", add="mean", palette = c("#00AFBB", "#E7B800"),add_density = FALSE, bins = 40, gggtheme = theme_pubr(), xlab = "Lab Value", title = "Pre Vs Post Repletion Lab Values - Potassium", ylab = "Repletions")
, xlim = c(2,6))
ggplot(postExclusionsK_Repleted, aes(x = valuenum,fill=preVsPost)) +
geom_histogram(alpha=0.6, position="identity",bins=40, color="black") + scale_x_continuous(limits = c(2,6) ) + theme_pubr() + xlab("Potassium Value") + ylab("Number of Occurrences") + scale_fill_discrete(name = "", labels = c("Post repletion K", "Pre repletion K"))
allNonRepletions <- bind_rows(list(pre_repletion = nonRepletLabsPre, post_repletion = nonRepletLabsPost), .id = "preVsPost")
#Run Exclusions
allNonRepletions %>%
anti_join(hadm_id_table, by = "hadm_id") -> postexclusion_nonRepletions
postexclusion_nonRepletions
postexclusion_nonRepletions %>%
group_by( preVsPost) %>%
summarize(n = n(), mean = mean(valuenum, na.rm = TRUE), standard_deviation = sd(valuenum, na.rm = T))
`summarise()` ungrouping output (override with `.groups` argument)
repletedVsNonRepleted_PreV <- bind_rows(list(repleted = postExclusionsK_Repleted, nonRepleted = postexclusion_nonRepletions), .id = "repleteVsNon") %>% filter(preVsPost == "pre_repletion")
repletedVsNonRepleted_PreV %>% distinct()
#Table
repletedVsNonRepleted_PreV %>%
group_by(repleteVsNon,flag) %>%
summarize(observations = n(),mean = mean(valuenum, na.rm = T), std_dev = sd(valuenum, na.rm=T)) %>%
mutate(percentage = observations / sum(observations) * 100)
`summarise()` regrouping output by 'repleteVsNon' (override with `.groups` argument)
#Visualizing the non-repleted vs repleted lab values
ggpar(gghistogram(data = repletedVsNonRepleted_PreV, x="valuenum", fill = "flag", add="mean",position = "identity", palette = c("#00AFBB", "#E7B800"),add_density = FALSE, bins = 100, gggtheme = theme_pubr(), xlab = "Lab Value", title = "Pre Vs Post Repletion Lab Values - Potassium", ylab = "Repletions", facet.by = "repleteVsNon")
, xlim = c(2,6))
Question: How can there be histogram bars that are “abnormal” on top of bars that are white? Are they just not granular enough to differentiate them? I think there are errors in how the data was flagged. Should look more into this. #### Looking at the outliers
postexclusion_nonRepletions %>%
filter(valuenum < 3.5 & flag == "abnormal") %>%
ggplot(aes(x = valuenum)) +
geom_histogram(alpha=0.6, position="identity",bins=14, color="black") + scale_x_continuous(limits = c(1,3.5)) + theme_pubr()
postexclusion_nonRepletions %>%
filter(flag == "abnormal" & valuenum < 4) %>%
ungroup() %>%
summarize(observations = n(),mean = mean(valuenum, na.rm = T), std_dev = sd(valuenum, na.rm=T))
postexclusion_nonRepletions %>%
filter(valuenum < 3.5 & flag == "abnormal") %>%
ggplot(aes(x = valuenum)) +
geom_histogram(alpha=0.6, position="identity",bins=14, color="black") + scale_x_continuous(limits = c(1,3.5)) + theme_pubr()
###Amount of people that replete (vs Non-Replete) across lab value
repletedVsNonRepleted_PreV %>%
group_by(valuenum, repleteVsNon) %>%
summarize(observations = n() ) %>%
ggplot(aes(fill=repleteVsNon, y=observations, x=valuenum)) +
geom_bar(position="fill", stat="identity") + scale_x_continuous() + theme_pubr()
`summarise()` regrouping output by 'valuenum' (override with `.groups` argument)
Examining the time of day for each repletion and lab value.
repletedVsNonRepleted_PreV %>%
mutate(RepletionHour = hour(starttime), LabHour = hour(charttime.lab)) %>%
gghistogram(x = c("LabHour","RepletionHour"), bins = 24, palette = "uchicago", alpha = 0.5, merge = T, xlab = "Hours", ylab = "Number of Occurences")
repletedVsNonRepleted_PreV %>%
ungroup() %>%
mutate(LabHour = hour(charttime.lab) + 4, RepletionHour = hour(starttime)) %>%
pivot_longer(cols = c(LabHour,RepletionHour), values_to="Hour", names_to="WhichHour") -> yy
ordered(yy$WhichHour)
[1] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[7] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[13] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[19] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[25] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[31] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[37] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[43] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[49] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[55] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[61] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[67] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[73] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[79] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[85] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[91] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[97] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[103] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[109] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[115] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[121] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[127] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[133] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[139] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[145] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[151] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[157] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[163] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[169] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[175] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[181] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[187] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[193] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[199] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[205] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[211] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[217] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[223] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[229] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[235] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[241] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[247] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[253] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[259] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[265] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[271] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[277] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[283] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[289] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[295] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[301] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[307] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[313] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[319] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[325] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[331] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[337] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[343] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[349] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[355] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[361] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[367] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[373] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[379] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[385] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[391] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[397] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[403] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[409] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[415] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[421] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[427] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[433] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[439] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[445] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[451] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[457] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[463] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[469] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[475] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[481] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[487] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[493] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[499] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[505] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[511] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[517] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[523] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[529] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[535] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[541] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[547] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[553] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[559] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[565] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[571] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[577] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[583] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[589] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[595] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[601] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[607] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[613] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[619] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[625] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[631] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[637] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[643] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[649] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[655] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[661] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[667] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[673] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[679] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[685] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[691] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[697] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[703] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[709] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[715] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[721] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[727] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[733] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[739] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[745] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[751] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[757] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[763] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[769] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[775] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[781] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[787] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[793] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[799] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[805] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[811] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[817] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[823] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[829] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[835] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[841] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[847] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[853] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[859] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[865] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[871] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[877] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[883] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[889] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[895] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[901] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[907] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[913] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[919] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[925] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[931] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[937] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[943] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[949] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[955] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[961] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[967] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[973] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[979] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[985] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[991] LabHour RepletionHour LabHour RepletionHour LabHour RepletionHour
[997] LabHour RepletionHour LabHour RepletionHour
[ reached getOption("max.print") -- omitted 49118 entries ]
Levels: LabHour < RepletionHour
yy$WhichHour <- factor(yy$WhichHour, ordered = FALSE)
yy$WhichHour <- relevel(yy$WhichHour,"RepletionHour")
ggplot(yy, aes(x = Hour,fill=WhichHour)) + geom_histogram(position="identity",bins = 24,alpha=0.6) +
scale_x_continuous(breaks=seq(0,24,2)) + theme_pubr()
ggplot(yy, aes(x = Hour,fill=WhichHour)) +
geom_histogram(alpha=0.4, position="identity",bins=24, color="black") + scale_x_continuous(breaks=seq(0,24,2)) + facet_wrap(vars(repleteVsNon))
Below, we have the time of day for lab value draws that occur for lab values that were repleted, and those that did not directly lead to a repletion.
It seems that those leading to a repltion were more likely to occur in the morning, while those that did not directly lead to a repletion were more likely to occur in the afternoon.
Why is this occurring? Perhaps, repletions in the morning are routine, but there is no routine in performing repletions in the afternoon.
repletedVsNonRepleted_PreV %>%
ungroup() %>%
mutate(LabHour = hour(charttime.lab)) %>%
filter(preVsPost == "pre_repletion") %>%
ggplot(aes(x = LabHour,fill=repleteVsNon)) + geom_histogram(position="identity",bins = 24,alpha=0.6, color = "black") + scale_x_continuous(breaks=seq(0,24,2)) + theme_pubr() + xlab("Hour of Day") + ylab("Number of Lab Values") + scale_fill_discrete(name = "", labels = c("Non-Repletion", "Repletion"))
NA
NA
repletedVsNonRepleted_PreV %>%
ungroup() %>%
mutate(LabHour = hour(charttime.lab)) %>%
filter(preVsPost == "pre_repletion") %>%
group_by(LabHour, repleteVsNon) %>%
summarize(mean_lab_value = mean(valuenum, na.rm = T)) %>%
pivot_wider(names_from = repleteVsNon, values_from = mean_lab_value)
`summarise()` regrouping output by 'LabHour' (override with `.groups` argument)